# Hyperparameter settings: one flat mapping of ten numeric scalars.
# NOTE(review): the code that reads this file is not visible here, so the
# meanings noted below are inferred from the key names only; confirm them
# against the consumer before relying on them.
#
# Presumably the network shape (hidden-layer count, hidden width) - confirm.
num_hidden_layer: 3
hidden_dim: 16
# Presumably optimiser settings (step size, epoch count, L2 penalty
# weight) - TODO confirm.
learning_rate: 0.005
num_epochs: 500
l2_coeff: 0.0005
# Presumably a dropout probability; verify whether the consumer treats it
# as a drop rate or a keep rate.
dropout_rate: 0.1
# NOTE(review): looks like L1 and entropy penalty weights for something
# named "x" (input features?) - confirm.
x_l1_coeff: 0.05
x_ent_coeff: 0.1
# Edge counterparts of the two keys above (presumably the same penalties
# applied to edges - confirm). Each value is 10x smaller than its x_* twin.
edge_l1_coeff: 0.005
edge_ent_coeff: 0.01
